#!/usr/bin/env bash
#
# Launch a vLLM server for the local Qwen3-32B-AWQ checkpoint, listening on
# all interfaces at port 8000.

# Very generous timeouts so long-running requests are not aborted.
# The "_S" suffix suggests seconds (36000 s = 10 h).
export VLLM_ENGINE_ITERATION_TIMEOUT_S=36000
# NOTE(review): presumably milliseconds (36000000 ms = 10 h, matching the
# value above) -- confirm against the vLLM environment-variable docs.
export VLLM_RPC_TIMEOUT=36000000

# --max-model-len is computed as 32 * 1024 = 32768.
# $(( ... )) is used instead of the deprecated $[ ... ] arithmetic form.
# -tp 2: presumably tensor-parallel size 2 -- confirm against `vllm serve --help`.
vllm serve "/mnt/share/1/Qwen/Qwen3-32B-AWQ" \
  --served_model_name "qwen3-32-awq" \
  -tp 2 \
  --max-model-len "$((32 * 1024))" \
  --enable-reasoning \
  --reasoning-parser qwen3 \
  --disable_log_stats \
  --trust-remote-code \
  --host 0.0.0.0 \
  --port 8000